# packages install stage
# Pin the base image tag so rebuilds do not silently pick up a different base.
# Override at build time with: docker build --build-arg BASE_TAG=<tag> .
ARG BASE_TAG=2023-10-20
FROM jupyter/datascience-notebook:${BASE_TAG}

# Point pip at the TUNA PyPI mirror; both settings are persisted in pip's
# config, so every later pip command in this image uses them.
RUN pip config set global.index-url https://pypi.tuna.tsinghua.edu.cn/simple \
    && pip config set install.trusted-host pypi.tuna.tsinghua.edu.cn

# install requirements
# --no-cache-dir keeps pip's download cache out of the image layers.
# Packages are listed one per line, sorted, so diffs stay readable.
RUN pip install --no-cache-dir \
        datasets \
        docarray \
        huggingface-hub \
        langchain \
        langchain-openai \
        openai \
        pandas \
        python-dotenv \
        requests \
        tiktoken \
        torch \
        transformers

# install pydantic 1.10.13 to avoid pydantic:ValidationError
# Runs after the main stack so the pin replaces whatever version was pulled in
# as a dependency; a pinned install swaps the version without a prior uninstall.
RUN pip install --no-cache-dir pydantic==1.10.13

# for milvus client sdk
RUN pip install --no-cache-dir pymilvus==2.3.0

# RUN pip install TensorFlow tokenizers gpt2
# Document parsing helpers.
RUN pip install --no-cache-dir \
        markdown \
        unstructured

# nltk is upgraded to the newest release. It goes into the same environment as
# every other package (no --user), so there is only one copy on the import path.
RUN pip install --no-cache-dir -U nltk

# Vector store, HTML parsing and graph tooling.
RUN pip install --no-cache-dir \
        beautifulsoup4 \
        lancedb \
        neo4j \
        pyvis

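# https://zhuanlan.zhihu.com/p/657220815
# Disabled: optional git / git-lfs install.
# NOTE(review): apt needs root; the base image may run as a non-root user --
# confirm, and wrap these in `USER root` / switch back if enabling them.
# RUN apt-get update -y && apt-get upgrade -y
# RUN apt-get install -y git git-lfs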


# Build and run (the tag used for `docker build` must match the one passed to `docker run`):
#   cd docker-jupyter
#   docker build -t jupyter-langchain:0.0.3 .
#   docker run -it -p 8888:8888 -v "${PWD}"/workspace:/home/jovyan/work --name jupyter-langchain jupyter-langchain:0.0.3
